Candace Savonen - CCDL for ALSF

This notebook sets up the MAF data files for comparison and does some first line analyses.

It is the first notebook in this series which addresses issue # 30 in OpenPBTA.

Usage

To run this from the command line, use:

Rscript -e "rmarkdown::render('analyses/mutect2-vs-strelka2/01-set-up.Rmd', 
                              clean = TRUE)"

This assumes you are in the top directory of the repository.

Set Up

# maftools is required by the rest of this notebook; install it from GitHub
# when it is missing (the original note says it is to be added to the
# project's Docker setup).
# `installed.packages()` returns a character matrix with one row per package,
# so compare against its row names only; `%in%` on the whole matrix would also
# look at every other cell.
if (!("maftools" %in% rownames(installed.packages()))) {
  devtools::install_github("PoisonAlien/maftools")
}

Get magrittr pipe

# Bind the pipe operator by name so `%>%` can be used below without attaching
# dplyr itself.
`%>%` <- dplyr::`%>%`

Directories and files

Path to the symlinked data obtained via bash download-data.sh.

# Relative locations of the shared data and scratch folders, two directory
# levels up from the working directory.
data_dir <- file.path("../..", "data")
scratch_dir <- file.path("../..", "scratch")

Create output directories in this analysis folder.

# Make sure each output folder exists before anything is written into it.
for (output_dir in c("results", "plots")) {
  if (!dir.exists(output_dir)) {
    dir.create(output_dir)
  }
}

Read in the metadata information

Running maftools::read.maf takes a lot of computing power and time, so to avoid having to run it for both datasets every time we want to re-run this notebook or the analyses in the other notebook, I’ve set this up to save the MAF objects as RDS files.

First let’s establish the file paths.

# Cached inputs for this analysis, all kept in the scratch directory.
# Despite the `_dir` suffix, each of these is the path to a single file.
metadata_dir <- file.path(scratch_dir, "metadata_filtered_maf_samples.tsv")
strelka2_dir <- file.path(scratch_dir, "strelka2.RDS")
mutect2_dir <- file.path(scratch_dir, "mutect2.RDS")

Read in the Strelka2 and Mutect2 data

Will read in as an maftools object from an RDS file, unless maftools has not been run on them yet. Establish whether the files we need for this already exist before running it again.

If you are trying to run the set-up step in a Docker container, it will likely be killed for running out of memory unless you can allot ~50GB to Docker.

Prep the metadata to be used as the clinicalData for maftools if it hasn’t been prepped yet.

# Check whether every cached file from a previous run is already present
files_needed <- file.exists(metadata_dir, strelka2_dir, mutect2_dir)

if (all(files_needed)) {
  # Everything is cached: load the filtered metadata and both MAF objects
  metadata <- readr::read_tsv(metadata_dir)
  strelka2 <- readRDS(strelka2_dir)
  mutect2 <- readRDS(mutect2_dir)
} else { # If any of the needed files don't exist, rerun this process:
  strelka2_maf_file <- file.path(data_dir, "pbta-snv-strelka2.vep.maf.gz")
  mutect2_maf_file <- file.path(data_dir, "pbta-snv-mutect2.vep.maf.gz")

  # Only import the sample names; `skip = 1` steps over the first line of
  # each file before the header row is read
  strelka2_samples <- data.table::fread(
    strelka2_maf_file,
    select = "Tumor_Sample_Barcode",
    skip = 1,
    data.table = FALSE
  )

  mutect2_samples <- data.table::fread(
    mutect2_maf_file,
    select = "Tumor_Sample_Barcode",
    skip = 1,
    data.table = FALSE
  )

  # `fread()` returns data.frames here, so pull the barcode column out of each
  # before combining. `c()` on the data.frames themselves builds a list, and
  # `%in%` cannot match individual IDs against that.
  maf_samples <- unique(c(
    strelka2_samples$Tumor_Sample_Barcode,
    mutect2_samples$Tumor_Sample_Barcode
  ))

  # Isolate metadata to only the samples that are in the datasets, keep one
  # row per biospecimen, and cache the result for later runs.
  # NOTE(review): maftools documents that `clinicalData` needs a
  # `Tumor_Sample_Barcode` column; confirm pbta-histologies.tsv provides one
  # or rename `Kids_First_Biospecimen_ID` before calling `read.maf()`.
  metadata <- readr::read_tsv(file.path(data_dir, "pbta-histologies.tsv")) %>%
    dplyr::filter(Kids_First_Biospecimen_ID %in% maf_samples) %>%
    dplyr::distinct(Kids_First_Biospecimen_ID, .keep_all = TRUE) %>%
    readr::write_tsv(metadata_dir)

  # Read in the original Strelka2 file with maftools. The object must be named
  # `strelka2`, because that is the name the rest of the notebook uses.
  strelka2 <- maftools::read.maf(strelka2_maf_file, clinicalData = metadata)

  # Save to RDS so we don't have to run this again
  saveRDS(strelka2, strelka2_dir)

  # Same for MuTect2
  mutect2 <- maftools::read.maf(mutect2_maf_file, clinicalData = metadata)
  saveRDS(mutect2, mutect2_dir)
}
Parsed with column specification:
cols(
  .default = col_character(),
  age_at_diagnosis = col_double(),
  molecular_subtype = col_logical()
)
See spec(...) for full column specifications.

Get summaries and write them to TSVs

Get gene summaries and write to TSV files.

# Per-gene mutation summaries for each caller, each saved under `results/`.
strelka2_gene_sum <- maftools::getGeneSummary(strelka2)
readr::write_tsv(
  strelka2_gene_sum,
  file.path("results", "strelka2_gene_summary.tsv")
)

mutect2_gene_sum <- maftools::getGeneSummary(mutect2)
readr::write_tsv(
  mutect2_gene_sum,
  file.path("results", "mutect2_gene_summary.tsv")
)

Get sample summaries and write to TSV files.

# Per-sample mutation summaries for each caller, each saved under `results/`.
strelka2_sample_sum <- maftools::getSampleSummary(strelka2)
readr::write_tsv(
  strelka2_sample_sum,
  file.path("results", "strelka2_sample_summary.tsv")
)

mutect2_sample_sum <- maftools::getSampleSummary(mutect2)
readr::write_tsv(
  mutect2_sample_sum,
  file.path("results", "mutect2_sample_summary.tsv")
)

Number of mutations per gene correlation

# Put both callers' gene summaries side by side: one row per gene and summary
# column, with the Mutect2 and Strelka2 values in separate columns.
# By default `full_join()` appends ".x" to shared columns from the left table
# (Mutect2) and ".y" to those from the right table (Strelka2), so the suffix
# tells us which caller a value came from.
combined_gene <- mutect2_gene_sum %>%
  dplyr::full_join(strelka2_gene_sum, by = "Hugo_Symbol") %>%
  reshape2::melt(id = "Hugo_Symbol") %>%
  # The dot is escaped so only a literal ".x" suffix is matched; an unescaped
  # "." would match any character before the trailing "x"
  dplyr::mutate(
    dataset = dplyr::if_else(
      grepl("\\.x$", variable), "mutect2", "strelka2"
    )
  ) %>%
  # Strip the join suffix so both callers share the same `variable` label
  dplyr::mutate(variable = gsub("\\.x$|\\.y$", "", variable)) %>%
  tidyr::spread("dataset", "value")

Let’s get a correlation test on the genes overall.

# Rank-based (Spearman) correlation between the Mutect2 and Strelka2 values
cor.test(combined_gene$mutect2, combined_gene$strelka2, method = "spearman")
Cannot compute exact p-value with ties

    Spearman's rank correlation rho

data:  combined_gene$mutect2 and combined_gene$strelka2
S = 4.7233e+13, p-value < 2.2e-16
alternative hypothesis: true rho is not equal to 0
sample estimates:
      rho 
0.9568251 
# Pearson correlation between the Mutect2 and Strelka2 values
cor.test(combined_gene$mutect2, combined_gene$strelka2, method = "pearson")

    Pearson's product-moment correlation

data:  combined_gene$mutect2 and combined_gene$strelka2
t = 567.61, df = 187234, p-value < 2.2e-16
alternative hypothesis: true correlation is not equal to 0
95 percent confidence interval:
 0.7935980 0.7969277
sample estimates:
      cor 
0.7952689 

Number of mutations per sample correlation.

# Put both callers' sample summaries side by side: one row per sample and
# summary column, with the Mutect2 and Strelka2 values in separate columns.
# By default `full_join()` appends ".x" to shared columns from the left table
# (Mutect2) and ".y" to those from the right table (Strelka2), so the suffix
# tells us which caller a value came from.
combined_sample <- mutect2_sample_sum %>%
  dplyr::full_join(strelka2_sample_sum, by = "Tumor_Sample_Barcode") %>%
  reshape2::melt(id = "Tumor_Sample_Barcode") %>%
  # The dot is escaped so only a literal ".x" suffix is matched; an unescaped
  # "." would match any character before the trailing "x"
  dplyr::mutate(
    dataset = dplyr::if_else(
      grepl("\\.x$", variable), "mutect2", "strelka2"
    )
  ) %>%
  # Strip the join suffix so both callers share the same `variable` label
  dplyr::mutate(variable = gsub("\\.x$|\\.y$", "", variable)) %>%
  tidyr::spread("dataset", "value")

Let’s get a correlation test on the samples overall.

# Rank-based (Spearman) correlation between the Mutect2 and Strelka2 values
cor.test(combined_sample$mutect2, combined_sample$strelka2, method = "spearman")
Cannot compute exact p-value with ties

    Spearman's rank correlation rho

data:  combined_sample$mutect2 and combined_sample$strelka2
S = 3.3543e+10, p-value < 2.2e-16
alternative hypothesis: true rho is not equal to 0
sample estimates:
      rho 
0.7808425 
# Pearson correlation between the Mutect2 and Strelka2 values
cor.test(combined_sample$mutect2, combined_sample$strelka2, method = "pearson")

    Pearson's product-moment correlation

data:  combined_sample$mutect2 and combined_sample$strelka2
t = 778.22, df = 9718, p-value < 2.2e-16
alternative hypothesis: true correlation is not equal to 0
95 percent confidence interval:
 0.9917519 0.9923801
sample estimates:
      cor 
0.9920722 

Plot Transition/Transversions

# Transition/transversion summary plot for the Strelka2 calls
maftools::plotTiTv(maftools::titv(strelka2))

# The same plot for the Mutect2 calls
maftools::plotTiTv(maftools::titv(mutect2))

Set up new variables

Here we will make these new variables for both the Mutect2 and Strelka2 datasets: - Calculate VAF for each - Make a mutation ID by concatenating gene name, base change, start position, and tumor sample barcode - Summarize the biotype variable for whether or not it is a coding gene.

Let’s do this for Strelka2 first.

# Derive per-variant annotations from the Strelka2 MAF table
strelka2_vaf <- strelka2@data %>%
  dplyr::mutate(
    # Variant allele fraction: alt reads over total (ref + alt) reads; counts
    # that cannot be parsed as numbers become NA
    vaf = as.numeric(t_alt_count) / (as.numeric(t_ref_count) +
      as.numeric(t_alt_count)),
    # Reference and alternate allele joined by ">", e.g. "A>T"
    base_change = paste0(Reference_Allele, ">", Allele),
    # Any biotype other than "protein_coding" is labelled non-coding.
    # NOTE(review): a missing (NA) BIOTYPE falls through to "protein_coding";
    # confirm that is intended.
    coding = dplyr::case_when(
      BIOTYPE != "protein_coding" ~ "non-coding",
      TRUE ~ "protein_coding"
    )
  ) %>%
  # Collapse changes into broad classes: a leading "-" is an insertion, a
  # trailing "-" is a deletion, anything else longer than three characters is
  # a long change, and three-character changes such as "A>T" are kept as is
  dplyr::mutate(change = dplyr::case_when(
    grepl("^-", base_change) ~ "insertion",
    grepl("-$", base_change) ~ "deletion",
    nchar(base_change) > 3 ~ "long_change",
    TRUE ~ base_change
  )) %>%
  dplyr::mutate(
    # Key used to match a variant between the two callers
    mutation_id = paste0(
      Hugo_Symbol, "_",
      change, "_",
      Start_Position, "_",
      Tumor_Sample_Barcode
    ),
    # Coarser gene-by-sample key
    general_id = paste0(Hugo_Symbol, "_", Tumor_Sample_Barcode)
  ) %>%
  # Drop columns that are entirely NA. `select_if()` keeps every column when
  # none qualifies, whereas `select(-which(...))` with an empty `which()`
  # result would drop all of them.
  dplyr::select_if(function(column) !all(is.na(column)))
NAs introduced by coercion
# Print the Strelka2 data frame to take a look at it
strelka2_vaf

Now we will do the same for MuTect2.

# Derive per-variant annotations from the Mutect2 MAF table
mutect2_vaf <- mutect2@data %>%
  dplyr::mutate(
    # Variant allele fraction: alt reads over total (ref + alt) reads; counts
    # that cannot be parsed as numbers become NA
    vaf = as.numeric(t_alt_count) / (as.numeric(t_ref_count) +
      as.numeric(t_alt_count)),
    # Reference and alternate allele joined by ">", e.g. "A>T"
    base_change = paste0(Reference_Allele, ">", Allele),
    # Any biotype other than "protein_coding" is labelled non-coding.
    # NOTE(review): a missing (NA) BIOTYPE falls through to "protein_coding";
    # confirm that is intended.
    coding = dplyr::case_when(
      BIOTYPE != "protein_coding" ~ "non-coding",
      TRUE ~ "protein_coding"
    )
  ) %>%
  # Collapse changes into broad classes: a leading "-" is an insertion, a
  # trailing "-" is a deletion, anything else longer than three characters is
  # a long change, and three-character changes such as "A>T" are kept as is
  dplyr::mutate(change = dplyr::case_when(
    grepl("^-", base_change) ~ "insertion",
    grepl("-$", base_change) ~ "deletion",
    nchar(base_change) > 3 ~ "long_change",
    TRUE ~ base_change
  )) %>%
  dplyr::mutate(
    # Key used to match a variant between the two callers
    mutation_id = paste0(
      Hugo_Symbol, "_",
      change, "_",
      Start_Position, "_",
      Tumor_Sample_Barcode
    ),
    # Coarser gene-by-sample key
    general_id = paste0(Hugo_Symbol, "_", Tumor_Sample_Barcode)
  ) %>%
  # Drop columns that are entirely NA. `select_if()` keeps every column when
  # none qualifies, whereas `select(-which(...))` with an empty `which()`
  # result would drop all of them.
  dplyr::select_if(function(column) !all(is.na(column)))

# Print the Mutect2 data frame to take a look at it
mutect2_vaf

Combine MuTect2 and Strelka2 data.frames into one data.frame

Save to a TSV file.

# Full join on the mutation ID so variants found by only one caller are kept;
# columns present in both tables get a caller-specific suffix.
vaf_df <- dplyr::full_join(
  strelka2_vaf,
  mutect2_vaf,
  by = "mutation_id",
  suffix = c(".strelka2", ".mutect2")
)

# Label each row by which caller(s) reported it: a missing allele on one side
# of the join means that caller has no matching row.
vaf_df <- dplyr::mutate(
  vaf_df,
  dataset = dplyr::case_when(
    is.na(Allele.mutect2) ~ "strelka2_only",
    is.na(Allele.strelka2) ~ "mutect2_only",
    TRUE ~ "both"
  )
)

# Save the combined table
readr::write_tsv(vaf_df, file.path("results", "combined_results.tsv"))

Session Info:

# Record the R version and package versions used for this run
sessionInfo()
R version 3.6.1 (2019-07-05)
Platform: x86_64-apple-darwin15.6.0 (64-bit)
Running under: macOS Mojave 10.14.5

Matrix products: default
BLAS:   /System/Library/Frameworks/Accelerate.framework/Versions/A/Frameworks/vecLib.framework/Versions/A/libBLAS.dylib
LAPACK: /Library/Frameworks/R.framework/Versions/3.6/Resources/lib/libRlapack.dylib

locale:
[1] en_US.UTF-8/en_US.UTF-8/en_US.UTF-8/C/en_US.UTF-8/en_US.UTF-8

attached base packages:
[1] parallel  stats     graphics  grDevices utils     datasets  methods   base     

other attached packages:
[1] Biobase_2.44.0      BiocGenerics_0.30.0

loaded via a namespace (and not attached):
 [1] pkgload_1.0.2        tidyr_0.8.3          splines_3.6.1        jsonlite_1.6        
 [5] foreach_1.4.7        assertthat_0.2.1     yaml_2.2.0           remotes_2.1.0       
 [9] sessioninfo_1.1.1    lattice_0.20-38      pillar_1.4.2         backports_1.1.4     
[13] glue_1.3.1           digest_0.6.20        RColorBrewer_1.1-2   colorspace_1.4-1    
[17] Matrix_1.2-17        htmltools_0.3.6      plyr_1.8.4           pkgconfig_2.0.2     
[21] devtools_2.1.0       bibtex_0.4.2         purrr_0.3.2          xtable_1.8-4        
[25] scales_1.0.0         processx_3.4.1       VennDiagram_1.6.20   tibble_2.1.3        
[29] pkgmaker_0.27        styler_1.1.1.9003    ggplot2_3.2.1        usethis_1.5.1       
[33] withr_2.1.2          lazyeval_0.2.2       cli_1.1.0            survival_2.44-1.1   
[37] magrittr_1.5         crayon_1.3.4         memoise_1.1.0        evaluate_0.14       
[41] ps_1.3.0             fs_1.3.1             doParallel_1.0.15    NMF_0.21.0          
[45] pkgbuild_1.0.4       tools_3.6.1          registry_0.5-1       data.table_1.12.2   
[49] prettyunits_1.0.2    hms_0.5.0            formatR_1.7          gridBase_0.4-7      
[53] stringr_1.4.0        munsell_0.5.0        cluster_2.1.0        rngtools_1.4        
[57] lambda.r_1.2.3       maftools_2.0.15      callr_3.3.1          compiler_3.6.1      
[61] rlang_0.4.0          futile.logger_1.4.3  grid_3.6.1           iterators_1.0.12    
[65] rstudioapi_0.10      colorblindr_0.1.0    base64enc_0.1-3      rmarkdown_1.14      
[69] testthat_2.2.1       gtable_0.3.0         codetools_0.2-16     curl_4.0            
[73] rematch2_2.1.0       reshape2_1.4.3       R6_2.4.0             knitr_1.24          
[77] dplyr_0.8.3          zeallot_0.1.0        rprojroot_1.3-2      futile.options_1.0.1
[81] readr_1.3.1          desc_1.2.0           stringi_1.4.3        Rcpp_1.0.2          
[85] vctrs_0.2.0          wordcloud_2.6        tidyselect_0.2.5     xfun_0.8            
LS0tCnRpdGxlOiAiU2V0IHVwIGNvbWJpbmVkIGRhdGEgb2YgTXV0ZWN0MiBhbmQgU3RyZWxrYTIiCm91dHB1dDogICAKICBodG1sX25vdGVib29rOiAKICAgIHRvYzogdHJ1ZQogICAgdG9jX2Zsb2F0OiB0cnVlCi0tLQoKQ2FuZGFjZSBTYXZvbmVuIC0gQ0NETCBmb3IgQUxTRgoKVGhpcyBub3RlYm9vayBzZXRzIHVwIHRoZSBNQUYgZGF0YSBmaWxlcyBmb3IgY29tcGFyaXNvbiBhbmQgZG9lcyBzb21lIGZpcnN0IApsaW5lIGFuYWx5c2VzLgoKSXQgaXMgdGhlIGZpcnN0IG5vdGVib29rIGluIHRoaXMgc2VyaWVzIHdoaWNoIGFkZHJlc3NlcyBbaXNzdWUgXCMgMzAgaW4gT3BlblBCVEFdKGh0dHBzOi8vZ2l0aHViLmNvbS9BbGV4c0xlbW9uYWRlL09wZW5QQlRBLWFuYWx5c2lzL2lzc3Vlcy8zMCkuCgojIyBVc2FnZQoKVG8gcnVuIHRoaXMgZnJvbSB0aGUgY29tbWFuZCBsaW5lLCB1c2U6CmBgYApSc2NyaXB0IC1lICJybWFya2Rvd246OnJlbmRlcignYW5hbHlzZXMvbXV0ZWN0Mi12cy1zdHJlbGthMi8wMS1zZXQtdXAuUm1kJywgCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgIGNsZWFuID0gVFJVRSkiCmBgYAoKIF9UaGlzIGFzc3VtZXMgeW91IGFyZSBpbiB0aGUgdG9wIGRpcmVjdG9yeSBvZiB0aGUgcmVwb3NpdG9yeS5fCgojIyBTZXQgVXAKCmBgYHtyfQojIFdlIG5lZWQgbWFmdG9vbHMgLSB0aGlzIHdpbGwgYmUgYWRkZWQgdG8gdGhlIHJ1bm5pbmcgRG9ja2VyIGlzc3VlIHdoZW5ldmVyIGl0IGlzIHVwCmlmICghKCJtYWZ0b29scyIgJWluJSBpbnN0YWxsZWQucGFja2FnZXMoKSkpIHsKICBkZXZ0b29sczo6aW5zdGFsbF9naXRodWIoIlBvaXNvbkFsaWVuL21hZnRvb2xzIikKfQpgYGAKCkdldCBgbWFncml0dHJgIHBpcGUKCmBgYHtyfQpgJT4lYCA8LSBkcGx5cjo6YCU+JWAKYGBgCgojIyMgRGlyZWN0b3JpZXMgYW5kIGZpbGVzCgpQYXRoIHRvIHRoZSBzeW1saW5rZWQgZGF0YSBvYnRhaW5lZCB2aWEgYGJhc2ggZG93bmxvYWQtZGF0YS5zaGAuCgpgYGB7cn0KZGF0YV9kaXIgPC0gZmlsZS5wYXRoKCIuLiIsICIuLiIsICJkYXRhIikKc2NyYXRjaF9kaXIgPC0gZmlsZS5wYXRoKCIuLiIsICIuLiIsICJzY3JhdGNoIikKYGBgCgpDcmVhdGUgb3V0cHV0IGRpcmVjdG9yaWVzIGluIHRoaXMgYW5hbHlzaXMgZm9sZGVyLgoKYGBge3J9CmlmICghZGlyLmV4aXN0cygicmVzdWx0cyIpKSB7CiAgZGlyLmNyZWF0ZSgicmVzdWx0cyIpCn0KaWYgKCFkaXIuZXhpc3RzKCJwbG90cyIpKSB7CiAgZGlyLmNyZWF0ZSgicGxvdHMiKQp9CmBgYAoKIyMgUmVhZCBpbiB0aGUgbWV0YWRhdGEgaW5mb3JtYXRpb24KClJ1bm5pbmcgYG1hZnRvb2xzOjpyZWFkLm1hZmAgdGFrZXMgYSBsb3Qgb2YgY29tcHV0aW5nIHBvd2VyIGFuZCB0aW1lLCBzbyB0byAKYXZvaWQgaGF2aW5nIHRvIHJ1biB0aGlzIGZvciBib3RoIGRhdGFzZXRzIGV2ZXJ5dGltZSB3ZSB3YW50IHRvIHJlLXJ1biB0aGlzIApub3RlYm9vayBvciB0aGUgYW5hbHlzZXMgaW4gdGhlIG90
aGVyIG5vdGVib29rLCBJJ3ZlIHNldCB0aGlzIHVwIHRvIHNhdmUgdGhlIApgTUFGYCBvYmplY3RzIGFzIGBSRFNgIGZpbGVzLgoKRmlyc3QgbGV0J3MgZXN0YWJsaXNoIHRoZSBmaWxlIHBhdGhzLgoKYGBge3J9CiMgRmlsZSBwYXRocyBmb3IgdGhlIG5lZWRlZCBmaWxlcyBmb3IgdGhpcyBhbmFseXNpcwogIG1ldGFkYXRhX2RpciA8LSBmaWxlLnBhdGgoc2NyYXRjaF9kaXIsICJtZXRhZGF0YV9maWx0ZXJlZF9tYWZfc2FtcGxlcy50c3YiKQpzdHJlbGthMl9kaXIgPC0gZmlsZS5wYXRoKHNjcmF0Y2hfZGlyLCAic3RyZWxrYTIuUkRTIikKbXV0ZWN0Ml9kaXIgPC0gZmlsZS5wYXRoKHNjcmF0Y2hfZGlyLCAibXV0ZWN0Mi5SRFMiKQpgYGAKCiMjIFJlYWQgaW4gdGhlIFN0cmVsa2EyIGFuZCBNdXRlY3QyIGRhdGEKCldpbGwgcmVhZCBpbiBhcyBhbiBgbWFmdG9vbHNgIG9iamVjdCBmcm9tIGFuIFJEUyBmaWxlLCB1bmxlc3MgYG1hZnRvb2xzYCBoYXMgbm90CmJlZW4gcnVuIG9uIHRoZW0geWV0LgpFc3RhYmxpc2ggd2hldGhlciB0aGUgZmlsZXMgd2UgbmVlZCBmb3IgdGhpcyBhbHJlYWR5IGV4aXN0IGJlZm9yZSBydW5uaW5nIGl0IAphZ2Fpbi4gCgpJZiB5b3UgdHJ5aW5nIHRvIHJ1biB0aGUgc2V0IHVwIHN0ZXAgaW4gYSBEb2NrZXIgY29udGFpbmVyLCBpdCB3aWxsIGxpa2VseSBiZSAKb3V0IG9mIG1lbW9yeSBraWxsZWQsIHVubGVzcyB5b3UgaGF2ZSB+NTBHQiB5b3UgY2FuIGFsbG90IHRvIERvY2tlci4gCgpQcmVwIHRoZSBtZXRhZGF0YSB0byBiZSB1c2VkIGFzIHRoZSBgY2xpbmljYWxEYXRhYCBmb3IgbWFmdG9vbHMgaXQgaXQgaGFzbid0IGJlZW4gCnByZXBwZWQgeWV0LiAKCmBgYHtyfQojIEdldCBhIHZlY3RvciBvZiB3aGV0aGVyIHRoZXNlIGV4aXN0CmZpbGVzX25lZWRlZCA8LSBmaWxlLmV4aXN0cyhtZXRhZGF0YV9kaXIsIHN0cmVsa2EyX2RpciwgbXV0ZWN0Ml9kaXIpCgppZiAoYWxsKGZpbGVzX25lZWRlZCkpIHsKICAjIFJlYWQgdGhlIHJlYWR5LXRvLWdvIGZpbGVzIGlmIHRoZXNlIGZpbGVzIGV4aXN0CiAgbWV0YWRhdGEgPC0gbWV0YWRhdGEgPC0gcmVhZHI6OnJlYWRfdHN2KG1ldGFkYXRhX2RpcikKICBzdHJlbGthMiA8LSByZWFkUkRTKHN0cmVsa2EyX2RpcikKICBtdXRlY3QyIDwtIHJlYWRSRFMobXV0ZWN0Ml9kaXIpCn0gZWxzZSB7ICMgSWYgYW55IG9mIHRoZSBuZWVkZWQgZmlsZXMgZG9uJ3QgZXhpc3QsIHJlcnVuIHRoaXMgcHJvY2VzczoKICAjIE9ubHkgaW1wb3J0IHRoZSBzYW1wbGUgbmFtZXMKICBzdHJlbGthMl9zYW1wbGVzIDwtIGRhdGEudGFibGU6OmZyZWFkKGZpbGUucGF0aCgKICAgIGRhdGFfZGlyLAogICAgInBidGEtc252LXN0cmVsa2EyLnZlcC5tYWYuZ3oiCiAgKSwKICBzZWxlY3QgPSAiVHVtb3JfU2FtcGxlX0JhcmNvZGUiLAogIHNraXAgPSAxLAogIGRhdGEudGFibGUgPSBGQUxTRQogICkKCiAgbXV0ZWN0Ml9zYW1wbGVzIDwtIGRhdGEudGFibGU6OmZyZWFkKGZpbGUucGF0aCgKICAgIGRh
dGFfZGlyLAogICAgInBidGEtc252LW11dGVjdDIudmVwLm1hZi5neiIKICApLAogIHNlbGVjdCA9ICJUdW1vcl9TYW1wbGVfQmFyY29kZSIsCiAgc2tpcCA9IDEsCiAgZGF0YS50YWJsZSA9IEZBTFNFCiAgKQoKICAjIElzb2xhdGUgbWV0YWRhdGEgdG8gb25seSB0aGUgc2FtcGxlcyB0aGF0IGFyZSBpbiB0aGUgZGF0YXNldHMKICBtZXRhZGF0YSA8LSByZWFkcjo6cmVhZF90c3YoZGF0YV9kaXIsICJwYnRhLWhpc3RvbG9naWVzLnRzdiIpICU+JQogICAgZHBseXI6OmZpbHRlcihLaWRzX0ZpcnN0X0Jpb3NwZWNpbWVuX0lEICVpbiUgYyhzdHJlbGthMl9zYW1wbGVzLCBtdXRlY3QyX3NhbXBsZXMpKSAlPiUKICAgIGRwbHlyOjpkaXN0aW5jdChLaWRzX0ZpcnN0X0Jpb3NwZWNpbWVuX0lELCAua2VlcF9hbGwgPSBUUlVFKSAlPiUKICAgIGRwbHlyOjphcnJhbmdlKCkgJT4lCiAgICByZWFkcjo6d3JpdGVfdHN2KGZpbGUucGF0aChzY3JhdGNoX2RpciwgIm1ldGFkYXRhX2ZpbHRlcmVkX21hZl9zYW1wbGVzLnRzdiIpKQoKICAjIFJlYWQgaW4gb3JpZ2luYWwgc3RyZWxrYSBmaWxlIHdpdGggbWFmdG9vbHMKICBzdHJlbGthIDwtIG1hZnRvb2xzOjpyZWFkLm1hZihmaWxlLnBhdGgoZGF0YV9kaXIsICJwYnRhLXNudi1zdHJlbGthMi52ZXAubWFmLmd6IiksCiAgICBjbGluaWNhbERhdGEgPSBtZXRhZGF0YQogICkKCiAgIyBTYXZlIHRvIFJEUyBzbyB3ZSBkb24ndCBoYXZlIHRvIHJ1biB0aGlzIGFnYWluCiAgc2F2ZVJEUyhzdHJlbGthLCBzdHJlbGthMl9kaXIpCgogICMgU2FtZSBmb3IgTXVUZWN0MgogIG11dGVjdDIgPC0gbWFmdG9vbHM6OnJlYWQubWFmKGZpbGUucGF0aChkYXRhX2RpciwgInBidGEtc252LW11dGVjdDIudmVwLm1hZi5neiIpLAogICAgY2xpbmljYWxEYXRhID0gbWV0YWRhdGEKICApCiAgc2F2ZVJEUyhtdXRlY3QyLCBtdXRlY3QyX2RpcikKfQpgYGAKCiMjIEdldCBzdW1tYXJpZXMgYW5kIHdyaXRlIHRoZW0gdG8gVFNWcyAKCkdldCBnZW5lIHN1bW1hcmllcyBhbmQgd3JpdGUgdG8gVFNWIGZpbGVzLiAKCmBgYHtyfQpzdHJlbGthMl9nZW5lX3N1bSA8LSBtYWZ0b29sczo6Z2V0R2VuZVN1bW1hcnkoc3RyZWxrYTIpICU+JQogIHJlYWRyOjp3cml0ZV90c3YoZmlsZS5wYXRoKAogICAgInJlc3VsdHMiLAogICAgInN0cmVsa2EyX2dlbmVfc3VtbWFyeS50c3YiCiAgKSkKCm11dGVjdDJfZ2VuZV9zdW0gPC0gbWFmdG9vbHM6OmdldEdlbmVTdW1tYXJ5KG11dGVjdDIpICU+JQogIHJlYWRyOjp3cml0ZV90c3YoZmlsZS5wYXRoKAogICAgInJlc3VsdHMiLAogICAgIm11dGVjdDJfZ2VuZV9zdW1tYXJ5LnRzdiIKICApKQpgYGAKCkdldCBzYW1wbGUgc3VtbWFyaWVzIGFuZCB3cml0ZSB0byBUU1YgZmlsZXMuIAoKYGBge3J9CnN0cmVsa2EyX3NhbXBsZV9zdW0gPC0gbWFmdG9vbHM6OmdldFNhbXBsZVN1bW1hcnkoc3RyZWxrYTIpICU+JQogIHJlYWRyOjp3cml0ZV90c3YoZmlsZS5wYXRoKAogICAgInJlc3VsdHMiLAogICAgInN0
cmVsa2EyX3NhbXBsZV9zdW1tYXJ5LnRzdiIKICApKQoKbXV0ZWN0Ml9zYW1wbGVfc3VtIDwtIG1hZnRvb2xzOjpnZXRTYW1wbGVTdW1tYXJ5KG11dGVjdDIpICU+JQogIHJlYWRyOjp3cml0ZV90c3YoZmlsZS5wYXRoKAogICAgInJlc3VsdHMiLAogICAgIm11dGVjdDJfc2FtcGxlX3N1bW1hcnkudHN2IgogICkpCmBgYAoKIyMgTnVtYmVyIG9mIG11dGF0aW9ucyBwZXIgZ2VuZSBjb3JyZWxhdGlvbiAKCmBgYHtyfQpjb21iaW5lZF9nZW5lIDwtIG11dGVjdDJfZ2VuZV9zdW0gJT4lCiAgZHBseXI6OmZ1bGxfam9pbihzdHJlbGthMl9nZW5lX3N1bSwgYnkgPSAiSHVnb19TeW1ib2wiKSAlPiUKICByZXNoYXBlMjo6bWVsdChpZCA9ICJIdWdvX1N5bWJvbCIpICU+JQogIGRwbHlyOjptdXRhdGUoZGF0YXNldCA9IGFzLmNoYXJhY3RlcihncmVwbCgiLngkIiwgdmFyaWFibGUpKSkgJT4lCiAgZHBseXI6Om11dGF0ZShkYXRhc2V0ID0gZHBseXI6OnJlY29kZShkYXRhc2V0LAogICAgYFRSVUVgID0gIm11dGVjdDIiLAogICAgYEZBTFNFYCA9ICJzdHJlbGthMiIKICApKSAlPiUKICBkcGx5cjo6bXV0YXRlKHZhcmlhYmxlID0gZ3N1YigiLngkfC55JCIsICIiLCB2YXJpYWJsZSkpICU+JQogIHRpZHlyOjpzcHJlYWQoImRhdGFzZXQiLCAidmFsdWUiKQpgYGAKCkxldCdzIGdldCBhIGNvcnJlbGF0aW9uIHRlc3Qgb24gdGhlIGdlbmVzIG92ZXJhbGwuCgpgYGB7cn0KY29yLnRlc3QoY29tYmluZWRfZ2VuZSRtdXRlY3QyLCBjb21iaW5lZF9nZW5lJHN0cmVsa2EyLCBtZXRob2QgPSAic3BlYXJtYW4iKQpjb3IudGVzdChjb21iaW5lZF9nZW5lJG11dGVjdDIsIGNvbWJpbmVkX2dlbmUkc3RyZWxrYTIsIG1ldGhvZCA9ICJwZWFyc29uIikKYGBgCgojIyBOdW1iZXIgb2YgbXV0YXRpb25zIHBlciBzYW1wbGUgY29ycmVsYXRpb24uIAoKYGBge3J9CmNvbWJpbmVkX3NhbXBsZSA8LSBtdXRlY3QyX3NhbXBsZV9zdW0gJT4lCiAgZHBseXI6OmZ1bGxfam9pbihzdHJlbGthMl9zYW1wbGVfc3VtLCBieSA9ICJUdW1vcl9TYW1wbGVfQmFyY29kZSIpICU+JQogIHJlc2hhcGUyOjptZWx0KGlkID0gIlR1bW9yX1NhbXBsZV9CYXJjb2RlIikgJT4lCiAgZHBseXI6Om11dGF0ZShkYXRhc2V0ID0gYXMuY2hhcmFjdGVyKGdyZXBsKCIueCQiLCB2YXJpYWJsZSkpKSAlPiUKICBkcGx5cjo6bXV0YXRlKGRhdGFzZXQgPSBkcGx5cjo6cmVjb2RlKGRhdGFzZXQsCiAgICBgVFJVRWAgPSAibXV0ZWN0MiIsCiAgICBgRkFMU0VgID0gInN0cmVsa2EyIgogICkpICU+JQogIGRwbHlyOjptdXRhdGUodmFyaWFibGUgPSBnc3ViKCIueCR8LnkkIiwgIiIsIHZhcmlhYmxlKSkgJT4lCiAgdGlkeXI6OnNwcmVhZCgiZGF0YXNldCIsICJ2YWx1ZSIpCmBgYAoKTGV0J3MgZ2V0IGEgY29ycmVsYXRpb24gdGVzdCBvbiB0aGUgZ2VuZXMgb3ZlcmFsbC4KCmBgYHtyfQpjb3IudGVzdChjb21iaW5lZF9zYW1wbGUkbXV0ZWN0MiwgY29tYmluZWRfc2FtcGxlJHN0cmVsa2EyLCBtZXRob2QgPSAi
c3BlYXJtYW4iKQpjb3IudGVzdChjb21iaW5lZF9zYW1wbGUkbXV0ZWN0MiwgY29tYmluZWRfc2FtcGxlJHN0cmVsa2EyLCBtZXRob2QgPSAicGVhcnNvbiIpCmBgYAoKIyMgUGxvdCBUcmFuc2l0aW9uL1RyYW5zdmVyc2lvbnMKCmBgYHtyfQptYWZ0b29sczo6cGxvdFRpVHYobWFmdG9vbHM6OnRpdHYoc3RyZWxrYTIpKQpgYGAKCmBgYHtyfQptYWZ0b29sczo6cGxvdFRpVHYobWFmdG9vbHM6OnRpdHYobXV0ZWN0MikpCmBgYAoKIyMgU2V0IHVwIG5ldyB2YXJpYWJsZXMKCkhlcmUgd2Ugd2lsbCBtYWtlIHRoZXNlIG5ldyB2YXJpYWJsZXMgZm9yIGJvdGggTXV0ZWN0MiBhbmQgU3RyZWxrYTIgZGF0YXNldDoKLSBDYWxjdWxhdGUgVkFGIGZvciBlYWNoCi0gTWFrZSBhIG11dGF0aW9uIElEIGJ5IGNvbmNhdGVuYXRpbmcgZ2VuZSBuYW1lLCBhbGxlbGUsIHR1bW9yIElELCBhbmQgc3RhcnQgcG9zaXRpb24KLSBTdW1tYXJpemUgdGhlIGJpb3R5cGUgdmFyaWFibGUgZm9yIHdoZXRoZXIgb3Igbm90IGl0IGlzIGEgY29kaW5nIGdlbmUuIAoKTGV0J3MgZG8gdGhpcyBmb3IgU3RyZWxrYTIgZmlyc3QuIAoKYGBge3J9CnN0cmVsa2EyX3ZhZiA8LSBzdHJlbGthMkBkYXRhICU+JQogIGRwbHlyOjptdXRhdGUoCiAgICB2YWYgPSBhcy5udW1lcmljKHRfYWx0X2NvdW50KSAvIChhcy5udW1lcmljKHRfcmVmX2NvdW50KSArCiAgICAgIGFzLm51bWVyaWModF9hbHRfY291bnQpKSwKICAgIGJhc2VfY2hhbmdlID0gcGFzdGUwKFJlZmVyZW5jZV9BbGxlbGUsICI+IiwgQWxsZWxlKSwKICAgIGNvZGluZyA9IGRwbHlyOjpjYXNlX3doZW4oCiAgICAgIEJJT1RZUEUgIT0gInByb3RlaW5fY29kaW5nIiB+ICJub24tY29kaW5nIiwKICAgICAgVFJVRSB+ICJwcm90ZWluX2NvZGluZyIKICAgICkKICApICU+JQogIGRwbHlyOjptdXRhdGUoY2hhbmdlID0gZHBseXI6OmNhc2Vfd2hlbigKICAgIGdyZXBsKCJeLSIsIGJhc2VfY2hhbmdlKSB+ICJpbnNlcnRpb24iLAogICAgZ3JlcGwoIi0kIiwgYmFzZV9jaGFuZ2UpIH4gImRlbGV0aW9uIiwKICAgIG5jaGFyKGJhc2VfY2hhbmdlKSA+IDMgfiAibG9uZ19jaGFuZ2UiLAogICAgVFJVRSB+IGJhc2VfY2hhbmdlCiAgKSkgJT4lCiAgZHBseXI6Om11dGF0ZSgKICAgIG11dGF0aW9uX2lkID0gcGFzdGUwKAogICAgICBIdWdvX1N5bWJvbCwgIl8iLAogICAgICBjaGFuZ2UsICJfIiwKICAgICAgU3RhcnRfUG9zaXRpb24sICJfIiwKICAgICAgVHVtb3JfU2FtcGxlX0JhcmNvZGUKICAgICksCiAgICBnZW5lcmFsX2lkID0gcGFzdGUwKEh1Z29fU3ltYm9sLCAiXyIsIFR1bW9yX1NhbXBsZV9CYXJjb2RlKQogICkgJT4lCiAgZHBseXI6OnNlbGVjdCgtd2hpY2goYXBwbHkoaXMubmEoLiksIDIsIGFsbCkpKQoKIyBUYWtlIGEgbG9vayBhdCB0aGlzIGRmCnN0cmVsa2EyX3ZhZgpgYGAKCk5vdyB3ZSB3aWxsIGRvIHRoZSBzYW1lIGZvciBNdVRlY3QyLgoKYGBge3J9Cm11dGVjdDJfdmFmIDwtIG11dGVjdDJAZGF0YSAlPiUKICBk
cGx5cjo6bXV0YXRlKAogICAgdmFmID0gYXMubnVtZXJpYyh0X2FsdF9jb3VudCkgLyAoYXMubnVtZXJpYyh0X3JlZl9jb3VudCkgKwogICAgICBhcy5udW1lcmljKHRfYWx0X2NvdW50KSksCiAgICBiYXNlX2NoYW5nZSA9IHBhc3RlMChSZWZlcmVuY2VfQWxsZWxlLCAiPiIsIEFsbGVsZSksCiAgICBjb2RpbmcgPSBkcGx5cjo6Y2FzZV93aGVuKAogICAgICBCSU9UWVBFICE9ICJwcm90ZWluX2NvZGluZyIgfiAibm9uLWNvZGluZyIsCiAgICAgIFRSVUUgfiAicHJvdGVpbl9jb2RpbmciCiAgICApCiAgKSAlPiUKICBkcGx5cjo6bXV0YXRlKGNoYW5nZSA9IGRwbHlyOjpjYXNlX3doZW4oCiAgICBncmVwbCgiXi0iLCBiYXNlX2NoYW5nZSkgfiAiaW5zZXJ0aW9uIiwKICAgIGdyZXBsKCItJCIsIGJhc2VfY2hhbmdlKSB+ICJkZWxldGlvbiIsCiAgICBuY2hhcihiYXNlX2NoYW5nZSkgPiAzIH4gImxvbmdfY2hhbmdlIiwKICAgIFRSVUUgfiBiYXNlX2NoYW5nZQogICkpICU+JQogIGRwbHlyOjptdXRhdGUoCiAgICBtdXRhdGlvbl9pZCA9IHBhc3RlMCgKICAgICAgSHVnb19TeW1ib2wsICJfIiwKICAgICAgY2hhbmdlLCAiXyIsCiAgICAgIFN0YXJ0X1Bvc2l0aW9uLCAiXyIsCiAgICAgIFR1bW9yX1NhbXBsZV9CYXJjb2RlCiAgICApLAogICAgZ2VuZXJhbF9pZCA9IHBhc3RlMChIdWdvX1N5bWJvbCwgIl8iLCBUdW1vcl9TYW1wbGVfQmFyY29kZSkKICApICU+JQogIGRwbHlyOjpzZWxlY3QoLXdoaWNoKGFwcGx5KGlzLm5hKC4pLCAyLCBhbGwpKSkKCiMgVGFrZSBhIGxvb2sgYXQgdGhpcyBkZgptdXRlY3QyX3ZhZgpgYGAKCiMjIENvbWJpbmUgTXVUZWN0MiBhbmQgU3RyZWxrYTIgZGF0YS5mcmFtZXMgaW50byBvbmUgZGF0YS5mcmFtZQoKU2F2ZSB0byBhIFRTViBmaWxlLgoKYGBge3J9CiMgTWVyZ2UgdGhlc2UgZGF0YS5mcmFtZXMgdG9nZXRoZXIKdmFmX2RmIDwtIHN0cmVsa2EyX3ZhZiAlPiUKICBkcGx5cjo6ZnVsbF9qb2luKG11dGVjdDJfdmFmLAogICAgYnkgPSAibXV0YXRpb25faWQiLAogICAgc3VmZml4ID0gYygiLnN0cmVsa2EyIiwgIi5tdXRlY3QyIikKICApICU+JQogICMgTWFrZSBhIHZhcmlhYmxlIHRoYXQgZGVub3RlcyB3aGljaCBkYXRhc2V0IGl0IGlzIGluLgogIGRwbHlyOjptdXRhdGUoZGF0YXNldCA9IGRwbHlyOjpjYXNlX3doZW4oCiAgICBpcy5uYShBbGxlbGUubXV0ZWN0MikgfiAic3RyZWxrYTJfb25seSIsCiAgICBpcy5uYShBbGxlbGUuc3RyZWxrYTIpIH4gIm11dGVjdDJfb25seSIsCiAgICBUUlVFIH4gImJvdGgiCiAgKSkgJT4lCiAgcmVhZHI6OndyaXRlX3RzdihmaWxlLnBhdGgoInJlc3VsdHMiLCAiY29tYmluZWRfcmVzdWx0cy50c3YiKSkKYGBgCgpTZXNzaW9uIEluZm86IAoKYGBge3J9CnNlc3Npb25JbmZvKCkKYGBgCg==